package www.wmx.com.xssc.util.similarity;

import cn.hutool.core.io.FileUtil;
import org.apache.tika.exception.TikaException;
import org.springframework.stereotype.Service;
import org.xml.sax.SAXException;

import java.io.File;
import java.io.IOException;
import java.util.regex.Pattern;



/**
 * Utility for counting the "meaningful" characters of a text, i.e. the
 * characters that remain once whitespace and punctuation have been removed.
 */
public class CharacterCounter {

    /**
     * Runs of characters that are excluded from the count: whitespace
     * ({@code \s}), ASCII punctuation ({@code \p{Punct}}) and the explicitly
     * listed full-width / CJK punctuation marks.
     * Compiled once because {@link Pattern} is immutable and thread-safe,
     * whereas {@code String.replaceAll} would recompile it on every call.
     */
    private static final Pattern IGNORED_CHARS =
            Pattern.compile("[\\s\\p{Punct}、，。？！；：“”‘’【】（）《》]+");

    /**
     * Counts the characters of {@code content} that are neither whitespace
     * nor one of the punctuation marks matched by {@link #IGNORED_CHARS}.
     *
     * <p>The result is measured in Unicode code points, so a supplementary
     * character stored as a surrogate pair (for example an emoji or a rare
     * CJK ideograph) counts as one character rather than two.
     *
     * @param content the text to measure; may be {@code null}
     * @return the number of remaining characters, or {@code 0} when
     *         {@code content} is {@code null} or contains nothing countable
     */
    public static int getCharNum(String content) {
        // A missing text has no characters; avoid the NullPointerException.
        if (content == null) {
            return 0;
        }
        String cleanText = IGNORED_CHARS.matcher(content).replaceAll("");
        // length() would report UTF-16 code units and over-count surrogate pairs.
        return cleanText.codePointCount(0, cleanText.length());
    }

}